Exploratory Data Analysis
# Fix the random seed so that later random steps (e.g. sampling rows) are
# reproducible from run to run:
set.seed(1)
# Preview the first ten rows of the data frame:
head(data, 10L)
## MS.Zoning Lot.Frontage Lot.Area Street Alley Lot.Shape Land.Contour
## 1 RL 141 31770 Pave None IR1 Lvl
## 2 RH 80 11622 Pave None Reg Lvl
## 3 RL 81 14267 Pave None IR1 Lvl
## 4 RL 93 11160 Pave None Reg Lvl
## 5 RL 74 13830 Pave None IR1 Lvl
## 6 RL 78 9978 Pave None IR1 Lvl
## 7 RL 41 4920 Pave None Reg Lvl
## 8 RL 43 5005 Pave None IR1 HLS
## 9 RL 39 5389 Pave None IR1 Lvl
## 10 RL 60 7500 Pave None Reg Lvl
## Lot.Config Land.Slope Condition.1 Condition.2 Bldg.Type House.Style
## 1 Corner Gtl Norm Norm 1Fam 1Story
## 2 Inside Gtl Feedr Norm 1Fam 1Story
## 3 Corner Gtl Norm Norm 1Fam 1Story
## 4 Corner Gtl Norm Norm 1Fam 1Story
## 5 Inside Gtl Norm Norm 1Fam 2Story
## 6 Inside Gtl Norm Norm 1Fam 2Story
## 7 Inside Gtl Norm Norm TwnhsE 1Story
## 8 Inside Gtl Norm Norm TwnhsE 1Story
## 9 Inside Gtl Norm Norm TwnhsE 1Story
## 10 Inside Gtl Norm Norm 1Fam 2Story
## Overall.Qual Overall.Cond Year.Built Year.Remod.Add Roof.Style Roof.Matl
## 1 6 5 1960 1960 Hip CompShg
## 2 5 6 1961 1961 Gable CompShg
## 3 6 6 1958 1958 Hip CompShg
## 4 7 5 1968 1968 Hip CompShg
## 5 5 5 1997 1998 Gable CompShg
## 6 6 6 1998 1998 Gable CompShg
## 7 8 5 2001 2001 Gable CompShg
## 8 8 5 1992 1992 Gable CompShg
## 9 8 5 1995 1996 Gable CompShg
## 10 7 5 1999 1999 Gable CompShg
## Exterior.1st Exterior.2nd Mas.Vnr.Type Mas.Vnr.Area Exter.Qual Exter.Cond
## 1 BrkFace Plywood Stone 112 TA TA
## 2 VinylSd VinylSd None 0 TA TA
## 3 Wood wood BrkFace 108 TA TA
## 4 BrkFace BrkFace None 0 Gd TA
## 5 VinylSd VinylSd None 0 TA TA
## 6 VinylSd VinylSd BrkFace 20 TA TA
## 7 CemntBd CmentBd None 0 Gd TA
## 8 HdBoard HdBoard None 0 Gd TA
## 9 CemntBd CmentBd None 0 Gd TA
## 10 VinylSd VinylSd None 0 TA TA
## Foundation Bsmt.Qual Bsmt.Cond Bsmt.Exposure BsmtFin.Type.1 BsmtFin.SF.1
## 1 CBlock TA Gd Gd BLQ 639
## 2 CBlock TA TA No Rec 468
## 3 CBlock TA TA No ALQ 923
## 4 CBlock TA TA No ALQ 1065
## 5 PConc Gd TA No GLQ 791
## 6 PConc TA TA No GLQ 602
## 7 PConc Gd TA Mn GLQ 616
## 8 PConc Gd TA No ALQ 263
## 9 PConc Gd TA No GLQ 1180
## 10 PConc TA TA No Unf 0
## BsmtFin.Type.2 BsmtFin.SF.2 Bsmt.Unf.SF Total.Bsmt.SF Heating Heating.QC
## 1 Unf 0 441 1080 Gas Fa
## 2 LwQ 144 270 882 Gas TA
## 3 Unf 0 406 1329 Gas TA
## 4 Unf 0 1045 2110 Gas Ex
## 5 Unf 0 137 928 Gas Gd
## 6 Unf 0 324 926 Gas Ex
## 7 Unf 0 722 1338 Gas Ex
## 8 Unf 0 1017 1280 Gas Ex
## 9 Unf 0 415 1595 Gas Ex
## 10 Unf 0 994 994 Gas Gd
## Central.Air Electrical X1st.Flr.SF X2nd.Flr.SF Low.Qual.Fin.SF Gr.Liv.Area
## 1 Y SBrkr 1656 0 0 1656
## 2 Y SBrkr 896 0 0 896
## 3 Y SBrkr 1329 0 0 1329
## 4 Y SBrkr 2110 0 0 2110
## 5 Y SBrkr 928 701 0 1629
## 6 Y SBrkr 926 678 0 1604
## 7 Y SBrkr 1338 0 0 1338
## 8 Y SBrkr 1280 0 0 1280
## 9 Y SBrkr 1616 0 0 1616
## 10 Y SBrkr 1028 776 0 1804
## Bsmt.Full.Bath Bsmt.Half.Bath Full.Bath Half.Bath Bedroom.AbvGr
## 1 1 0 1 0 3
## 2 0 0 1 0 2
## 3 0 0 1 1 3
## 4 1 0 2 1 3
## 5 0 0 2 1 3
## 6 0 0 2 1 3
## 7 1 0 2 0 2
## 8 0 0 2 0 2
## 9 1 0 2 0 2
## 10 0 0 2 1 3
## Kitchen.AbvGr Kitchen.Qual TotRms.AbvGrd Functional Fireplaces Fireplace.Qu
## 1 1 TA 7 Typ 2 Gd
## 2 1 TA 5 Typ 0 None
## 3 1 Gd 6 Typ 0 None
## 4 1 Ex 8 Typ 2 TA
## 5 1 TA 6 Typ 1 TA
## 6 1 Gd 7 Typ 1 Gd
## 7 1 Gd 6 Typ 0 None
## 8 1 Gd 5 Typ 0 None
## 9 1 Gd 5 Typ 1 TA
## 10 1 Gd 7 Typ 1 TA
## Garage.Type Garage.Yr.Blt Garage.Finish Garage.Cars Garage.Area Garage.Qual
## 1 Attchd 1960 Fin 2 528 TA
## 2 Attchd 1961 Unf 1 730 TA
## 3 Attchd 1958 Unf 1 312 TA
## 4 Attchd 1968 Fin 2 522 TA
## 5 Attchd 1997 Fin 2 482 TA
## 6 Attchd 1998 Fin 2 470 TA
## 7 Attchd 2001 Fin 2 582 TA
## 8 Attchd 1992 RFn 2 506 TA
## 9 Attchd 1995 RFn 2 608 TA
## 10 Attchd 1999 Fin 2 442 TA
## Garage.Cond Paved.Drive Wood.Deck.SF Open.Porch.SF Enclosed.Porch
## 1 TA P 210 62 0
## 2 TA Y 140 0 0
## 3 TA Y 393 36 0
## 4 TA Y 0 0 0
## 5 TA Y 212 34 0
## 6 TA Y 360 36 0
## 7 TA Y 0 0 170
## 8 TA Y 0 82 0
## 9 TA Y 237 152 0
## 10 TA Y 140 60 0
## X3Ssn.Porch Screen.Porch Pool.Area Fence Misc.Val Yr.Sold Sale.Type
## 1 0 0 0 None 0 2010 WD
## 2 0 120 0 MnPrv 0 2010 WD
## 3 0 0 0 None 12500 2010 WD
## 4 0 0 0 None 0 2010 WD
## 5 0 0 0 MnPrv 0 2010 WD
## 6 0 0 0 None 0 2010 WD
## 7 0 0 0 None 0 2010 WD
## 8 0 144 0 None 0 2010 WD
## 9 0 0 0 None 0 2010 WD
## 10 0 0 0 None 0 2010 WD
## Sale.Condition SalePrice
## 1 Normal 215000
## 2 Normal 105000
## 3 Normal 172000
## 4 Normal 244000
## 5 Normal 189900
## 6 Normal 195500
## 7 Normal 213500
## 8 Normal 191500
## 9 Normal 236500
## 10 Normal 189000
# Inspect the data frame's dimensions and the type of every column:
str(object = data)
## 'data.frame': 2925 obs. of 74 variables:
## $ MS.Zoning : chr "RL" "RH" "RL" "RL" ...
## $ Lot.Frontage : int 141 80 81 93 74 78 41 43 39 60 ...
## $ Lot.Area : int 31770 11622 14267 11160 13830 9978 4920 5005 5389 7500 ...
## $ Street : chr "Pave" "Pave" "Pave" "Pave" ...
## $ Alley : chr "None" "None" "None" "None" ...
## $ Lot.Shape : chr "IR1" "Reg" "IR1" "Reg" ...
## $ Land.Contour : chr "Lvl" "Lvl" "Lvl" "Lvl" ...
## $ Lot.Config : chr "Corner" "Inside" "Corner" "Corner" ...
## $ Land.Slope : chr "Gtl" "Gtl" "Gtl" "Gtl" ...
## $ Condition.1 : chr "Norm" "Feedr" "Norm" "Norm" ...
## $ Condition.2 : chr "Norm" "Norm" "Norm" "Norm" ...
## $ Bldg.Type : chr "1Fam" "1Fam" "1Fam" "1Fam" ...
## $ House.Style : chr "1Story" "1Story" "1Story" "1Story" ...
## $ Overall.Qual : int 6 5 6 7 5 6 8 8 8 7 ...
## $ Overall.Cond : int 5 6 6 5 5 6 5 5 5 5 ...
## $ Year.Built : int 1960 1961 1958 1968 1997 1998 2001 1992 1995 1999 ...
## $ Year.Remod.Add : int 1960 1961 1958 1968 1998 1998 2001 1992 1996 1999 ...
## $ Roof.Style : chr "Hip" "Gable" "Hip" "Hip" ...
## $ Roof.Matl : chr "CompShg" "CompShg" "CompShg" "CompShg" ...
## $ Exterior.1st : chr "BrkFace" "VinylSd" "Wood" "BrkFace" ...
## $ Exterior.2nd : chr "Plywood" "VinylSd" "wood" "BrkFace" ...
## $ Mas.Vnr.Type : chr "Stone" "None" "BrkFace" "None" ...
## $ Mas.Vnr.Area : int 112 0 108 0 0 20 0 0 0 0 ...
## $ Exter.Qual : chr "TA" "TA" "TA" "Gd" ...
## $ Exter.Cond : chr "TA" "TA" "TA" "TA" ...
## $ Foundation : chr "CBlock" "CBlock" "CBlock" "CBlock" ...
## $ Bsmt.Qual : chr "TA" "TA" "TA" "TA" ...
## $ Bsmt.Cond : chr "Gd" "TA" "TA" "TA" ...
## $ Bsmt.Exposure : chr "Gd" "No" "No" "No" ...
## $ BsmtFin.Type.1 : chr "BLQ" "Rec" "ALQ" "ALQ" ...
## $ BsmtFin.SF.1 : int 639 468 923 1065 791 602 616 263 1180 0 ...
## $ BsmtFin.Type.2 : chr "Unf" "LwQ" "Unf" "Unf" ...
## $ BsmtFin.SF.2 : int 0 144 0 0 0 0 0 0 0 0 ...
## $ Bsmt.Unf.SF : int 441 270 406 1045 137 324 722 1017 415 994 ...
## $ Total.Bsmt.SF : int 1080 882 1329 2110 928 926 1338 1280 1595 994 ...
## $ Heating : chr "Gas" "Gas" "Gas" "Gas" ...
## $ Heating.QC : chr "Fa" "TA" "TA" "Ex" ...
## $ Central.Air : chr "Y" "Y" "Y" "Y" ...
## $ Electrical : chr "SBrkr" "SBrkr" "SBrkr" "SBrkr" ...
## $ X1st.Flr.SF : int 1656 896 1329 2110 928 926 1338 1280 1616 1028 ...
## $ X2nd.Flr.SF : int 0 0 0 0 701 678 0 0 0 776 ...
## $ Low.Qual.Fin.SF: int 0 0 0 0 0 0 0 0 0 0 ...
## $ Gr.Liv.Area : int 1656 896 1329 2110 1629 1604 1338 1280 1616 1804 ...
## $ Bsmt.Full.Bath : int 1 0 0 1 0 0 1 0 1 0 ...
## $ Bsmt.Half.Bath : int 0 0 0 0 0 0 0 0 0 0 ...
## $ Full.Bath : int 1 1 1 2 2 2 2 2 2 2 ...
## $ Half.Bath : int 0 0 1 1 1 1 0 0 0 1 ...
## $ Bedroom.AbvGr : int 3 2 3 3 3 3 2 2 2 3 ...
## $ Kitchen.AbvGr : int 1 1 1 1 1 1 1 1 1 1 ...
## $ Kitchen.Qual : chr "TA" "TA" "Gd" "Ex" ...
## $ TotRms.AbvGrd : int 7 5 6 8 6 7 6 5 5 7 ...
## $ Functional : chr "Typ" "Typ" "Typ" "Typ" ...
## $ Fireplaces : int 2 0 0 2 1 1 0 0 1 1 ...
## $ Fireplace.Qu : chr "Gd" "None" "None" "TA" ...
## $ Garage.Type : chr "Attchd" "Attchd" "Attchd" "Attchd" ...
## $ Garage.Yr.Blt : int 1960 1961 1958 1968 1997 1998 2001 1992 1995 1999 ...
## $ Garage.Finish : chr "Fin" "Unf" "Unf" "Fin" ...
## $ Garage.Cars : int 2 1 1 2 2 2 2 2 2 2 ...
## $ Garage.Area : int 528 730 312 522 482 470 582 506 608 442 ...
## $ Garage.Qual : chr "TA" "TA" "TA" "TA" ...
## $ Garage.Cond : chr "TA" "TA" "TA" "TA" ...
## $ Paved.Drive : chr "P" "Y" "Y" "Y" ...
## $ Wood.Deck.SF : int 210 140 393 0 212 360 0 0 237 140 ...
## $ Open.Porch.SF : int 62 0 36 0 34 36 0 82 152 60 ...
## $ Enclosed.Porch : int 0 0 0 0 0 0 170 0 0 0 ...
## $ X3Ssn.Porch : int 0 0 0 0 0 0 0 0 0 0 ...
## $ Screen.Porch : int 0 120 0 0 0 0 0 144 0 0 ...
## $ Pool.Area : int 0 0 0 0 0 0 0 0 0 0 ...
## $ Fence : chr "None" "MnPrv" "None" "None" ...
## $ Misc.Val : int 0 0 12500 0 0 0 0 0 0 0 ...
## $ Yr.Sold : int 2010 2010 2010 2010 2010 2010 2010 2010 2010 2010 ...
## $ Sale.Type : chr "WD " "WD " "WD " "WD " ...
## $ Sale.Condition : chr "Normal" "Normal" "Normal" "Normal" ...
## $ SalePrice : int 215000 105000 172000 244000 189900 195500 213500 191500 236500 189000 ...
# Per-column summaries. For numeric columns this includes the count of missing
# values (the "NA's" row); character columns only report length/class/mode:
summary(object = data)
## MS.Zoning Lot.Frontage Lot.Area Street
## Length:2925 Min. : 21.00 Min. : 1300 Length:2925
## Class :character 1st Qu.: 58.00 1st Qu.: 7438 Class :character
## Mode :character Median : 68.00 Median : 9428 Mode :character
## Mean : 69.07 Mean : 10108
## 3rd Qu.: 80.00 3rd Qu.: 11520
## Max. :313.00 Max. :215245
## NA's :490
## Alley Lot.Shape Land.Contour Lot.Config
## Length:2925 Length:2925 Length:2925 Length:2925
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
##
##
##
##
## Land.Slope Condition.1 Condition.2 Bldg.Type
## Length:2925 Length:2925 Length:2925 Length:2925
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
##
##
##
##
## House.Style Overall.Qual Overall.Cond Year.Built
## Length:2925 Min. : 1.000 Min. :1.000 Min. :1872
## Class :character 1st Qu.: 5.000 1st Qu.:5.000 1st Qu.:1954
## Mode :character Median : 6.000 Median :5.000 Median :1973
## Mean : 6.094 Mean :5.565 Mean :1971
## 3rd Qu.: 7.000 3rd Qu.:6.000 3rd Qu.:2001
## Max. :10.000 Max. :9.000 Max. :2010
##
## Year.Remod.Add Roof.Style Roof.Matl Exterior.1st
## Min. :1950 Length:2925 Length:2925 Length:2925
## 1st Qu.:1965 Class :character Class :character Class :character
## Median :1993 Mode :character Mode :character Mode :character
## Mean :1984
## 3rd Qu.:2004
## Max. :2010
##
## Exterior.2nd Mas.Vnr.Type Mas.Vnr.Area Exter.Qual
## Length:2925 Length:2925 Min. : 0.0 Length:2925
## Class :character Class :character 1st Qu.: 0.0 Class :character
## Mode :character Mode :character Median : 0.0 Mode :character
## Mean : 101.1
## 3rd Qu.: 164.0
## Max. :1600.0
## NA's :23
## Exter.Cond Foundation Bsmt.Qual Bsmt.Cond
## Length:2925 Length:2925 Length:2925 Length:2925
## Class :character Class :character Class :character Class :character
## Mode :character Mode :character Mode :character Mode :character
##
##
##
##
## Bsmt.Exposure BsmtFin.Type.1 BsmtFin.SF.1 BsmtFin.Type.2
## Length:2925 Length:2925 Min. : 0.0 Length:2925
## Class :character Class :character 1st Qu.: 0.0 Class :character
## Mode :character Mode :character Median : 370.0 Mode :character
## Mean : 439.3
## 3rd Qu.: 734.0
## Max. :2288.0
## NA's :1
## BsmtFin.SF.2 Bsmt.Unf.SF Total.Bsmt.SF Heating
## Min. : 0.00 Min. : 0.0 Min. : 0 Length:2925
## 1st Qu.: 0.00 1st Qu.: 219.0 1st Qu.: 793 Class :character
## Median : 0.00 Median : 464.5 Median : 990 Mode :character
## Mean : 49.81 Mean : 559.2 Mean :1048
## 3rd Qu.: 0.00 3rd Qu.: 801.2 3rd Qu.:1300
## Max. :1526.00 Max. :2336.0 Max. :3206
## NA's :1 NA's :1 NA's :1
## Heating.QC Central.Air Electrical X1st.Flr.SF
## Length:2925 Length:2925 Length:2925 Min. : 334
## Class :character Class :character Class :character 1st Qu.: 877
## Mode :character Mode :character Mode :character Median :1084
## Mean :1157
## 3rd Qu.:1383
## Max. :3820
##
## X2nd.Flr.SF Low.Qual.Fin.SF Gr.Liv.Area Bsmt.Full.Bath
## Min. : 0.0 Min. : 0.000 Min. : 334 Min. :0.0000
## 1st Qu.: 0.0 1st Qu.: 0.000 1st Qu.:1126 1st Qu.:0.0000
## Median : 0.0 Median : 0.000 Median :1442 Median :0.0000
## Mean : 335.2 Mean : 4.685 Mean :1496 Mean :0.4307
## 3rd Qu.: 703.0 3rd Qu.: 0.000 3rd Qu.:1742 3rd Qu.:1.0000
## Max. :2065.0 Max. :1064.000 Max. :4476 Max. :3.0000
## NA's :2
## Bsmt.Half.Bath Full.Bath Half.Bath Bedroom.AbvGr
## Min. :0.0000 Min. :0.000 Min. :0.0000 Min. :0.000
## 1st Qu.:0.0000 1st Qu.:1.000 1st Qu.:0.0000 1st Qu.:2.000
## Median :0.0000 Median :2.000 Median :0.0000 Median :3.000
## Mean :0.0609 Mean :1.566 Mean :0.3791 Mean :2.855
## 3rd Qu.:0.0000 3rd Qu.:2.000 3rd Qu.:1.0000 3rd Qu.:3.000
## Max. :2.0000 Max. :4.000 Max. :2.0000 Max. :8.000
## NA's :2
## Kitchen.AbvGr Kitchen.Qual TotRms.AbvGrd Functional
## Min. :0.000 Length:2925 Min. : 2.000 Length:2925
## 1st Qu.:1.000 Class :character 1st Qu.: 5.000 Class :character
## Median :1.000 Mode :character Median : 6.000 Mode :character
## Mean :1.044 Mean : 6.438
## 3rd Qu.:1.000 3rd Qu.: 7.000
## Max. :3.000 Max. :14.000
##
## Fireplaces Fireplace.Qu Garage.Type Garage.Yr.Blt
## Min. :0.0000 Length:2925 Length:2925 Min. :1895
## 1st Qu.:0.0000 Class :character Class :character 1st Qu.:1960
## Median :1.0000 Mode :character Mode :character Median :1979
## Mean :0.5979 Mean :1978
## 3rd Qu.:1.0000 3rd Qu.:2002
## Max. :4.0000 Max. :2207
## NA's :159
## Garage.Finish Garage.Cars Garage.Area Garage.Qual
## Length:2925 Min. :0.000 Min. : 0 Length:2925
## Class :character 1st Qu.:1.000 1st Qu.: 320 Class :character
## Mode :character Median :2.000 Median : 480 Mode :character
## Mean :1.766 Mean : 472
## 3rd Qu.:2.000 3rd Qu.: 576
## Max. :5.000 Max. :1488
## NA's :1 NA's :1
## Garage.Cond Paved.Drive Wood.Deck.SF Open.Porch.SF
## Length:2925 Length:2925 Min. : 0.00 Min. : 0.00
## Class :character Class :character 1st Qu.: 0.00 1st Qu.: 0.00
## Mode :character Mode :character Median : 0.00 Median : 27.00
## Mean : 93.58 Mean : 47.21
## 3rd Qu.: 168.00 3rd Qu.: 70.00
## Max. :1424.00 Max. :742.00
##
## Enclosed.Porch X3Ssn.Porch Screen.Porch Pool.Area
## Min. : 0.00 Min. : 0.000 Min. : 0.00 Min. : 0.000
## 1st Qu.: 0.00 1st Qu.: 0.000 1st Qu.: 0.00 1st Qu.: 0.000
## Median : 0.00 Median : 0.000 Median : 0.00 Median : 0.000
## Mean : 23.05 Mean : 2.597 Mean : 16.03 Mean : 2.083
## 3rd Qu.: 0.00 3rd Qu.: 0.000 3rd Qu.: 0.00 3rd Qu.: 0.000
## Max. :1012.00 Max. :508.000 Max. :576.00 Max. :800.000
##
## Fence Misc.Val Yr.Sold Sale.Type
## Length:2925 Min. : 0.00 Min. :2006 Length:2925
## Class :character 1st Qu.: 0.00 1st Qu.:2007 Class :character
## Mode :character Median : 0.00 Median :2008 Mode :character
## Mean : 44.91 Mean :2008
## 3rd Qu.: 0.00 3rd Qu.:2009
## Max. :15500.00 Max. :2010
##
## Sale.Condition SalePrice
## Length:2925 Min. : 34900
## Class :character 1st Qu.:129500
## Mode :character Median :160000
## Mean :180916
## 3rd Qu.:213500
## Max. :755000
##
# Keep only complete cases: na.omit() drops every row that has an NA in any
# column and records the dropped row indices in the "na.action" attribute.
# NOTE(review): this is a listwise deletion, so a single sparsely populated
# column can remove many rows -- compare the row counts before and after.
data2 <- na.omit(data)
# Check the structure (and remaining row count) of the cleaned data frame:
str(data2)
## 'data.frame': 2258 obs. of 74 variables:
## $ MS.Zoning : chr "RL" "RH" "RL" "RL" ...
## $ Lot.Frontage : int 141 80 81 93 74 78 41 43 39 60 ...
## $ Lot.Area : int 31770 11622 14267 11160 13830 9978 4920 5005 5389 7500 ...
## $ Street : chr "Pave" "Pave" "Pave" "Pave" ...
## $ Alley : chr "None" "None" "None" "None" ...
## $ Lot.Shape : chr "IR1" "Reg" "IR1" "Reg" ...
## $ Land.Contour : chr "Lvl" "Lvl" "Lvl" "Lvl" ...
## $ Lot.Config : chr "Corner" "Inside" "Corner" "Corner" ...
## $ Land.Slope : chr "Gtl" "Gtl" "Gtl" "Gtl" ...
## $ Condition.1 : chr "Norm" "Feedr" "Norm" "Norm" ...
## $ Condition.2 : chr "Norm" "Norm" "Norm" "Norm" ...
## $ Bldg.Type : chr "1Fam" "1Fam" "1Fam" "1Fam" ...
## $ House.Style : chr "1Story" "1Story" "1Story" "1Story" ...
## $ Overall.Qual : int 6 5 6 7 5 6 8 8 8 7 ...
## $ Overall.Cond : int 5 6 6 5 5 6 5 5 5 5 ...
## $ Year.Built : int 1960 1961 1958 1968 1997 1998 2001 1992 1995 1999 ...
## $ Year.Remod.Add : int 1960 1961 1958 1968 1998 1998 2001 1992 1996 1999 ...
## $ Roof.Style : chr "Hip" "Gable" "Hip" "Hip" ...
## $ Roof.Matl : chr "CompShg" "CompShg" "CompShg" "CompShg" ...
## $ Exterior.1st : chr "BrkFace" "VinylSd" "Wood" "BrkFace" ...
## $ Exterior.2nd : chr "Plywood" "VinylSd" "wood" "BrkFace" ...
## $ Mas.Vnr.Type : chr "Stone" "None" "BrkFace" "None" ...
## $ Mas.Vnr.Area : int 112 0 108 0 0 20 0 0 0 0 ...
## $ Exter.Qual : chr "TA" "TA" "TA" "Gd" ...
## $ Exter.Cond : chr "TA" "TA" "TA" "TA" ...
## $ Foundation : chr "CBlock" "CBlock" "CBlock" "CBlock" ...
## $ Bsmt.Qual : chr "TA" "TA" "TA" "TA" ...
## $ Bsmt.Cond : chr "Gd" "TA" "TA" "TA" ...
## $ Bsmt.Exposure : chr "Gd" "No" "No" "No" ...
## $ BsmtFin.Type.1 : chr "BLQ" "Rec" "ALQ" "ALQ" ...
## $ BsmtFin.SF.1 : int 639 468 923 1065 791 602 616 263 1180 0 ...
## $ BsmtFin.Type.2 : chr "Unf" "LwQ" "Unf" "Unf" ...
## $ BsmtFin.SF.2 : int 0 144 0 0 0 0 0 0 0 0 ...
## $ Bsmt.Unf.SF : int 441 270 406 1045 137 324 722 1017 415 994 ...
## $ Total.Bsmt.SF : int 1080 882 1329 2110 928 926 1338 1280 1595 994 ...
## $ Heating : chr "Gas" "Gas" "Gas" "Gas" ...
## $ Heating.QC : chr "Fa" "TA" "TA" "Ex" ...
## $ Central.Air : chr "Y" "Y" "Y" "Y" ...
## $ Electrical : chr "SBrkr" "SBrkr" "SBrkr" "SBrkr" ...
## $ X1st.Flr.SF : int 1656 896 1329 2110 928 926 1338 1280 1616 1028 ...
## $ X2nd.Flr.SF : int 0 0 0 0 701 678 0 0 0 776 ...
## $ Low.Qual.Fin.SF: int 0 0 0 0 0 0 0 0 0 0 ...
## $ Gr.Liv.Area : int 1656 896 1329 2110 1629 1604 1338 1280 1616 1804 ...
## $ Bsmt.Full.Bath : int 1 0 0 1 0 0 1 0 1 0 ...
## $ Bsmt.Half.Bath : int 0 0 0 0 0 0 0 0 0 0 ...
## $ Full.Bath : int 1 1 1 2 2 2 2 2 2 2 ...
## $ Half.Bath : int 0 0 1 1 1 1 0 0 0 1 ...
## $ Bedroom.AbvGr : int 3 2 3 3 3 3 2 2 2 3 ...
## $ Kitchen.AbvGr : int 1 1 1 1 1 1 1 1 1 1 ...
## $ Kitchen.Qual : chr "TA" "TA" "Gd" "Ex" ...
## $ TotRms.AbvGrd : int 7 5 6 8 6 7 6 5 5 7 ...
## $ Functional : chr "Typ" "Typ" "Typ" "Typ" ...
## $ Fireplaces : int 2 0 0 2 1 1 0 0 1 1 ...
## $ Fireplace.Qu : chr "Gd" "None" "None" "TA" ...
## $ Garage.Type : chr "Attchd" "Attchd" "Attchd" "Attchd" ...
## $ Garage.Yr.Blt : int 1960 1961 1958 1968 1997 1998 2001 1992 1995 1999 ...
## $ Garage.Finish : chr "Fin" "Unf" "Unf" "Fin" ...
## $ Garage.Cars : int 2 1 1 2 2 2 2 2 2 2 ...
## $ Garage.Area : int 528 730 312 522 482 470 582 506 608 442 ...
## $ Garage.Qual : chr "TA" "TA" "TA" "TA" ...
## $ Garage.Cond : chr "TA" "TA" "TA" "TA" ...
## $ Paved.Drive : chr "P" "Y" "Y" "Y" ...
## $ Wood.Deck.SF : int 210 140 393 0 212 360 0 0 237 140 ...
## $ Open.Porch.SF : int 62 0 36 0 34 36 0 82 152 60 ...
## $ Enclosed.Porch : int 0 0 0 0 0 0 170 0 0 0 ...
## $ X3Ssn.Porch : int 0 0 0 0 0 0 0 0 0 0 ...
## $ Screen.Porch : int 0 120 0 0 0 0 0 144 0 0 ...
## $ Pool.Area : int 0 0 0 0 0 0 0 0 0 0 ...
## $ Fence : chr "None" "MnPrv" "None" "None" ...
## $ Misc.Val : int 0 0 12500 0 0 0 0 0 0 0 ...
## $ Yr.Sold : int 2010 2010 2010 2010 2010 2010 2010 2010 2010 2010 ...
## $ Sale.Type : chr "WD " "WD " "WD " "WD " ...
## $ Sale.Condition : chr "Normal" "Normal" "Normal" "Normal" ...
## $ SalePrice : int 215000 105000 172000 244000 189900 195500 213500 191500 236500 189000 ...
## - attr(*, "na.action")= 'omit' Named int [1:667] 12 15 23 24 25 28 56 58 59 67 ...
## ..- attr(*, "names")= chr [1:667] "12" "15" "23" "24" ...
# Train/test split: draw 1800 row indices at random for training and hold out
# the remaining rows for testing. With the 2258 complete cases in `data2` this
# is roughly an 80/20 split.
# The population size is taken from `data2` itself so the split stays valid if
# the number of complete cases changes.
n_obs <- nrow(data2)
n_train <- 1800
stopifnot(n_train <= n_obs)
train <- sample(n_obs, n_train)
# Test indices are every row not selected for training, in ascending order:
test <- setdiff(seq_len(n_obs), train)
# Build a data frame holding only the numeric columns of `data2` (areas,
# counts, years, quality ratings and the SalePrice response).
# Columns are selected by type rather than by hard-coded position, so the
# selection stays correct if the column order of `data2` changes; the original
# column order is preserved.
is_numeric_col <- vapply(data2, is.numeric, logical(1))
num.ames <- data2[, is_numeric_col, drop = FALSE]
# Plot SalePrice against every other column of `num.ames` (one plot per
# predictor), restricted to the training rows, to eyeball relationships and
# distributions:
plot(SalePrice ~ ., data = num.ames, subset = train)

































